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4 <110> APPLICANT: Dunn-Coleman, Nigel 

5 Goedegebuur, Frits 

6 Ward, Michael 

7 Yao, Jian 

9 <120> TITLE OF INVENTION: EGVI Endoglucanase and Nucleic Acids 
10 Encoding the Same 

12 <130> FILE REFERENCE: GC698 

14 <140> CURRENT APPLICATION NUMBER: US 10/026,994 

15 <141> CURRENT FILING DATE: J^2-0^30 

17 <160> NUMBER OF SEQ ID NOS: 4 

19 <170> SOFTWARE: FastSEQ for Windows Version 4.0 

21 <210> SEQ ID NO: 1 

22 <211> LENGTH: 2710 

23 <212> TYPE: DNA 

24 <213> ORGANISM: Trichoderma reesei 

26 <400> SEQUENCE: 1 

27 ccacgcgtcc gagcagtgtc ctcctcctca ctgcttcgtc atgaaggtct ctcgagtcct 60 

28 tgcccttgtc ctgggggccg tcatccctgc ccatgctgcc ttttcatgga agaacgtcaa 120 

29 gctcggcggc ggcggcggct tcgtccccgg catcatcttc catcccaaga caaaaggcgt 180 

30 agcatatgca cgaacagata ttggcgggct gtaccgcctc aacgccgacg actcatggac 240 

31 cgccgtcacg gatgggattg ctgataatgc cggctggcac aactggggca tcgacgctgt 300 

32 tgcgcttgat ccgcaggacg atcaaaaggt gtatgccgca gtcggcatgt atacgaacag 360 

33 ctgggatccg agtaatggag ccatcattcg ctcgtcagac cgcggcgcaa cgtggtcctt 420 

34 caccaacttg cccttcaaag tcgggggtaa catgccagga cgcggagccg gagagcgtct 480 

35 ggctgtcgat ccggccaact ccaacatcat ctactttggt gctcgctcag gaaacggcct 540 

36 ctggaagtct acggacggcg gcgtgacctt ttccaaggtc tcgtcgttca cggcaactgg 600 

37 gacgtacatc ccagacccga gtgattccaa cggctacaac agcgacaagc aaggactcat 660 

38 gtgggttacg ttcgactcaa ccagcagcac gaccggggga gccacgtctc gtatctttgt 720 

39 tggcacggct gataacatca ctgcttcagt ctatgtgagc acgaatgccg gctccacgtg 780 

40 gagtgctgta ccggggcagc cagggaaata ctttcctcac aaggcgaaac tgcagccagc 840 

41 agagaaggcc ttgtatctga cctattccga tggcacaggg ccgtatgatg gcacacttgg 900 

42 ctcagtgtgg aggtacgaca ttgcaggggg aacttggaaa gacatcaccc ctgtctctgg 960 

43 atcagatcta tactttggct ttggcggcct tggcctcgat ttgcaaaagc caggaaccct 1020 

44 tgttgttgct tctttgaact cttggtggcc agatgctcag ctgtttcggt cgaccgactc 1080 

45 tgggacaaca tggagcccga tctgggcgtg ggcgagctat ccgactgaga cctattacta 1140 

46 cagcatctca actcccaaag caccgtggat caagaacaac tttatcgatg tgacgagcga 1200 

47 gtcaccgtcc gatggtctca tcaagcgcct cggctggatg attgagtctc tcgagattga 1260 

48 cccaaccgac agcaaccact ggctctacgg caccggaatg acaatctttg gcggccacga 1320 

49 tctcaccaac tgggacacgc gccacaatgt gtcaatccaa tcactggcag acggcatcga 1380 

50 ggaattctcc gtccaggacc tggcctctgc acccggcgga agcgagctat tggccgcagt 1440 

51 cggagacgac aacggcttca cctttgccag cagaaacgac ctcgggacat cgccgcagac 1500 

52 ggtctgggca acgcccacat gggccacctc gacgagcgtc gactacgccg ggaactcggt 1560 

53 caagagcgtc gtccgcgtcg gcaacaccgc cggcacgcaa caggtggcca tctcgtccga 1620 
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54 cggcggcgcg acgtggagca tcgactacgc ggccgacacg tccatgaacg gcggcacggt 1680 

55 ggcctattcg gccgacggcg acacgatcct ctggtcgacc gcctcgtccg gcgtgcagcg 1740 

56 ctcgcagttc cagggcagct ttgcctccgt ctcgagcctg cccgcgggcg ccgtcatcgc 1800 

57 ctcggacaag aagaccaaca gcgtcttcta cgccggctcc ggatcgacct tttacgtcag 1860 

58 caaggacacc ggcagcagct tcacgcgcgg gcccaagctg ggcagcgcag ggacgatccg 1920 

59 ggatatcgct gctcacccga ccaccgcggg cacgttgtat gtctcgaccg acgtcggcat 1980 

60 attccgctcc acagactcgg gcacgacctt tggccaagtc tccaccgccc tgaccaacac 2040 

61 ctaccagatc gccctgggtg tgggctcagg ctcgaactgg aacctgtatg ccttcggcac 2100 

62 cggcccgtca ggggctcgcc tctacgccag tggagacagc ggcgcctcct ggacggacat 2160 

63 ccagggctcc cagggcttcg gctccatcga cagcaccaag gtcgccggca gcggcagcac 2220 

64 cgccgggcaa gtctacgtgg gcaccaacgg ccggggcgtc ttttacgctc agggaaccgt 2280 

65 cggcggcggc acgggcggga cttcctcgtc gaccaagcag agcagcagca gtacctcttc 2340 

66 cgccagctcg agcaccacgc tgaggtcgag cgttgtatcc acgacccggg cttcgacggt 2400 

67 gacttcgtcg aggaccagct cggccgccgg tcccacgggg tcaggggtcg ccggtcatta 2460 

68 tgctcagtgc ggagggattg ggtggacggg gccgacgcag tgtgtggcgc cgtatgtctg 2520 

69 ccagaagcag aatgattatt actaccagtg tgtgtgatgc ttgaactgcc aagctcacga 2580 

70 ggagagctac atacccctag gctcgcagta aagagctcaa gcatccgaag aagcactagt 2640 

71 agtagagatc cagtcagata attatccatt tgtttgaatt aaatgatctt ctattgaaaa 2700 

72 aaaaaaaaaa 

74 <210> SEQ ID NO: 2 

75 <211> LENGTH: 818 

76 <212> TYPE: PRT 

77 <213> ORGANISM: Trichoderma reesei 
79 <400> SEQUENCE: 2 
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100 Val Ser Ser Phe Thr Ala Thr Gly Thr Tyr Ile Pro Asp Pro Ser Asp 

101 165 170 175 

102 Ser Asn Gly Tyr Asn Ser Asp Lys Gln Gly Leu Met Trp Val Thr Phe 

103 180 185 190 

104 Asp Ser Thr Ser Ser Thr Thr Gly Gly Ala Thr Ser Arg Ile Phe Val 
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182 Cys Val 

185 <210> SEQ ID NO: 3 

186 <211> LENGTH: 19 

187 <212> TYPE: PRT 

188 <213> ORGANISM: Trichoderma reesei 

190 <400> SEQUENCE: 3 

191 Met Lys Val Ser Arg Val Leu Ala Leu Val Leu Gly Ala Val Ile Pro 

192 1 5 10 15 

193 Ala His Ala 

196 <210> SEQ ID NO: 4 

197 <211> LENGTH: 2517 

198 <212> TYPE: DNA 

199 <213> ORGANISM: Trichoderma reesei 

201 <400> SEQUENCE: 4 

202 atgaaggtct ctcgagtcct tgcccttgtc ctgggggccg tcatccctgc ccatgctgcc 60 

203 ttttcatgga agaacgtcaa gctcggcggc ggcggcggct tcgtccccgg catcatcttc 120 

204 catcccaaga caaaaggcgt agcatatgca cgaacagata ttggcgggct gtaccgcctc 180 

205 aacgccgacg actcatggac cgccgtcacg gatgggattg ctgataatgc cggctggcac 240 

206 aactggggca tcgacgctgt tgcgcttgat ccgcaggacg atcaaaaggt gtatgccgca 300 

207 gtcggcatgt atacgaacag ctgggatccg agtaatggag ccatcattcg ctcgtcagac 360 

208 cgcggcgcaa cgtggtcctt caccaacttg cccttcaaag tcgggggtaa catgccagga 420 
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209 cgcggagccg gagagcgtct ggctgtcgat ccggccaact ccaacatcat ctactttggt 

210 gctcgctcag gaaacggcct ctggaagtct acggacggcg gcgtgacctt ttccaaggtc 

211 tcgtcgttca cggcaactgg gacgtacatc ccagacccga gtgattccaa cggctacaac 

212 agcgacaagc aaggactcat gtgggttacg ttcgactcaa ccagcagcac gaccggggga 

213 gccacgtctc gtatctttgt tggcacggct gataacatca ctgcttcagt ctatgtgagc 

214 acgaatgccg gctccacgtg gagtgctgta ccggggcagc cagggaaata ctttcctcac 

215 aaggcgaaac tgcagccagc agagaaggcc ttgtatctga cctattccga tggcacaggg 

216 ccgtatgatg gcacacttgg ctcagtgtgg aggtacgaca ttgcaggggg aacttggaaa 

217 gacatcaccc ctgtctctgg atcagatcta tactttggct ttggcggcct tggcctcgat 

218 ttgcaaaagc caggaaccct tgttgttgct tctttgaact cttggtggcc agatgctcag 

219 ctgtttcggt cgaccgactc tgggacaaca tggagcccga tctgggcgtg ggcgagctat 

220 ccgactgaga cctattacta cagcatctca actcccaaag caccgtggat caagaacaac 

221 tttatcgatg tgacgagcga gtcaccgtcc gatggtctca tcaagcgcct cggctggatg 

222 attgagtctc tcgagattga cccaaccgac agcaaccact ggctctacgg caccggaatg 

223 acaatctttg gcggccacga tctcaccaac tgggacacgc gccacaatgt gtcaatccaa 

224 tcactggcag acggcatcga ggaattctcc gtccaggacc tggcctctgc acccggcgga 

225 agcgagctat tggccgcagt cggagacgac aacggcttca cctttgccag cagaaacgac 

226 ctcgggacat cgccgcagac ggtctgggca acgcccacat gggccacctc gacgagcgtc 

227 gactacgccg ggaactcggt caagagcgtc gtccgcgtcg gcaacaccgc cggcacgcaa 

228 caggtggcca tctcgtccga cggcggcgcg acgtggagca tcgactacgc ggccgacacg 
229 tccatgaacg gcggcacggt ggcctattcg gccgacggcg acacgatcct ctggtcgacc 

230 gcctcgtccg gcgtgcagcg ctcgcagttc cagggcagct ttgcctccgt ctcgagcctg 

231 cccgcgggcg ccgtcatcgc ctcggacaag aagaccaaca gcgtcttcta cgccggctcc 

232 ggatcgacct tttacgtcag caaggacacc ggcagcagct tcacgcgcgg gcccaagctg 

233 ggcagcgcag ggacgatccg ggatatcgct gctcacccga ccaccgcggg cacgttgtat 

234 gtctcgaccg acgtcggcat attccgctcc acagactcgg gcacgacctt tggccaagtc 

235 tccaccgccc tgaccaacac ctaccagatc gccctgggtg tgggctcagg ctcgaactgg 
236 aacctgtatg ccttcggcac cggcccgtca ggggctcgcc tctacgccag tggagacagc 

237 ggcgcctcct ggacggacat ccagggctcc cagggcttcg gctccatcga cagcaccaag 

238 gtcgccggca gcggcagcac cgccgggcaa gtctacgtgg gcaccaacgg ccggggcgtc 

239 ttttacgctc agggaaccgt cggcggcggc acgggcggga cttcctcgtc gaccaagcag 

240 agcagcagca gtacctcttc cgccagctcg agcaccacgc tgaggtcgag cgttgtatcc 

241 acgacccggg cttcgacggt gacttcgtcg aggaccagct cggccgccgg tcccacgggg 

242 tcaggggtcg ccggtcatta tgctcagtgc ggagggattg ggtggacggg gccgacgcag 

243 tgtgtggcgc cgtatgtctg ccagaagcag aatgattatt actaccagtg tgtgtga 
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